#ifndef CUFFTDX_FFT_28_FP32_FWD_PTX_HPP
#define CUFFTDX_FFT_28_FP32_FWD_PTX_HPP



// Explicit specialization of cufftdx_private_function for <12, float, 1>.
// The meaning of the three template arguments is defined by the primary
// template, which is not visible here. NOTE(review): the include guard name
// (FFT_28_FP32_FWD) suggests this is a 28-point forward FP32 transform -- confirm.
//
// Parameters:
//   rmem - array of at least 28 complex<float> values. Elements [0..27] are
//          read as inputs and overwritten in place with the results.
//   smem - not referenced anywhere in this specialization.
//
// The whole body is one inline-PTX statement made of straight-line f32
// add/sub/mul/fma instructions (no loads, stores, branches or barriers).
// Structure of the PTX, as read from the operand indices:
//   1. Four 7-point stages, one per stride-4 subset of rmem:
//      {0,4,...,24}, {2,6,...,26}, {1,5,...,25}, {3,7,...,27}.
//   2. Constant multiplications applied to the {2,6,...} results, followed by
//      add/sub butterflies with the {0,4,...} results; the same is done for
//      the {3,7,...} / {1,5,...} pair.
//   3. A second round of constant multiplications on the odd-index half and a
//      final add/sub butterfly that writes the 28 outputs.
// The hex immediates decode to +/-0.62349, +/-0.22252, +/-0.90097, +/-0.78183,
// +/-0.97493 and +/-0.43388, which match cos/sin values at multiples of pi/14.
// The scratch declarations are larger than needed: f<697> exceeds the highest
// register referenced, and rd<2> is never used.
template<> __forceinline__ __device__ void cufftdx_private_function<12, float, 1>(cufftdx::detail::complex<float> *rmem, unsigned smem){

asm volatile (R"({
.reg .f32 f<697>;
.reg .b64 rd<2>;
add.f32 f113, %66, %120;
add.f32 f114, %56, f113;
add.f32 f115, %77, %109;
add.f32 f116, f115, f114;
add.f32 f117, %88, %98;
add.f32 f118, f117, f116;
add.f32 f119, %68, %121;
add.f32 f120, %57, f119;
add.f32 f121, %79, %111;
add.f32 f122, f121, f120;
add.f32 f123, %89, %100;
add.f32 f124, f123, f122;
fma.rn.f32 f125, f113, 0f3F1F9D07, %56;
mul.f32 f126, f115, 0f3E63DC87;
sub.f32 f127, f125, f126;
mul.f32 f128, f117, 0f3F66A5E5;
sub.f32 f129, f127, f128;
sub.f32 f130, %68, %121;
mul.f32 f131, f130, 0f3F48261C;
sub.f32 f132, %79, %111;
mul.f32 f133, f132, 0fBF7994E0;
sub.f32 f134, f133, f131;
sub.f32 f135, %89, %100;
mul.f32 f136, f135, 0f3EDE2602;
sub.f32 f137, f134, f136;
sub.f32 f138, f129, f137;
add.f32 f139, f137, f129;
mul.f32 f140, f113, 0f3E63DC87;
sub.f32 f141, %56, f140;
mul.f32 f142, f115, 0f3F66A5E5;
sub.f32 f143, f141, f142;
fma.rn.f32 f144, f117, 0f3F1F9D07, f143;
mul.f32 f145, f130, 0f3F7994E0;
mul.f32 f146, f132, 0f3EDE2602;
sub.f32 f147, f146, f145;
fma.rn.f32 f148, f135, 0f3F48261C, f147;
sub.f32 f149, f144, f148;
add.f32 f150, f148, f144;
mul.f32 f151, f113, 0f3F66A5E5;
sub.f32 f152, %56, f151;
fma.rn.f32 f153, f115, 0f3F1F9D07, f152;
mul.f32 f154, f117, 0f3E63DC87;
sub.f32 f155, f153, f154;
mul.f32 f156, f130, 0f3EDE2602;
mul.f32 f157, f132, 0f3F48261C;
sub.f32 f158, f157, f156;
mul.f32 f159, f135, 0f3F7994E0;
sub.f32 f160, f158, f159;
sub.f32 f161, f155, f160;
add.f32 f162, f160, f155;
fma.rn.f32 f163, f119, 0f3F1F9D07, %57;
mul.f32 f164, f121, 0f3E63DC87;
sub.f32 f165, f163, f164;
mul.f32 f166, f123, 0f3F66A5E5;
sub.f32 f167, f165, f166;
sub.f32 f168, %66, %120;
mul.f32 f169, f168, 0f3F48261C;
sub.f32 f170, %77, %109;
mul.f32 f171, f170, 0fBF7994E0;
sub.f32 f172, f171, f169;
sub.f32 f173, %88, %98;
mul.f32 f174, f173, 0f3EDE2602;
sub.f32 f175, f172, f174;
add.f32 f176, f175, f167;
sub.f32 f177, f167, f175;
mul.f32 f178, f119, 0f3E63DC87;
sub.f32 f179, %57, f178;
mul.f32 f180, f121, 0f3F66A5E5;
sub.f32 f181, f179, f180;
fma.rn.f32 f182, f123, 0f3F1F9D07, f181;
mul.f32 f183, f168, 0f3F7994E0;
mul.f32 f184, f170, 0f3EDE2602;
sub.f32 f185, f184, f183;
fma.rn.f32 f186, f173, 0f3F48261C, f185;
add.f32 f187, f186, f182;
sub.f32 f188, f182, f186;
mul.f32 f189, f119, 0f3F66A5E5;
sub.f32 f190, %57, f189;
fma.rn.f32 f191, f121, 0f3F1F9D07, f190;
mul.f32 f192, f123, 0f3E63DC87;
sub.f32 f193, f191, f192;
mul.f32 f194, f168, 0f3EDE2602;
mul.f32 f195, f170, 0f3F48261C;
sub.f32 f196, f195, f194;
mul.f32 f197, f173, 0f3F7994E0;
sub.f32 f198, f196, f197;
add.f32 f199, f198, f193;
sub.f32 f200, f193, f198;
add.f32 f201, %72, %125;
add.f32 f202, %61, f201;
add.f32 f203, %82, %114;
add.f32 f204, f203, f202;
add.f32 f205, %93, %104;
add.f32 f206, f205, f204;
add.f32 f207, %73, %127;
add.f32 f208, %63, f207;
add.f32 f209, %84, %116;
add.f32 f210, f209, f208;
add.f32 f211, %95, %105;
add.f32 f212, f211, f210;
fma.rn.f32 f213, f201, 0f3F1F9D07, %61;
mul.f32 f214, f203, 0f3E63DC87;
sub.f32 f215, f213, f214;
mul.f32 f216, f205, 0f3F66A5E5;
sub.f32 f217, f215, f216;
sub.f32 f218, %73, %127;
mul.f32 f219, f218, 0f3F48261C;
sub.f32 f220, %84, %116;
mul.f32 f221, f220, 0fBF7994E0;
sub.f32 f222, f221, f219;
sub.f32 f223, %95, %105;
mul.f32 f224, f223, 0f3EDE2602;
sub.f32 f225, f222, f224;
sub.f32 f226, f217, f225;
add.f32 f227, f225, f217;
mul.f32 f228, f201, 0f3E63DC87;
sub.f32 f229, %61, f228;
mul.f32 f230, f203, 0f3F66A5E5;
sub.f32 f231, f229, f230;
fma.rn.f32 f232, f205, 0f3F1F9D07, f231;
mul.f32 f233, f218, 0f3F7994E0;
mul.f32 f234, f220, 0f3EDE2602;
sub.f32 f235, f234, f233;
fma.rn.f32 f236, f223, 0f3F48261C, f235;
sub.f32 f237, f232, f236;
add.f32 f238, f236, f232;
mul.f32 f239, f201, 0f3F66A5E5;
sub.f32 f240, %61, f239;
fma.rn.f32 f241, f203, 0f3F1F9D07, f240;
mul.f32 f242, f205, 0f3E63DC87;
sub.f32 f243, f241, f242;
mul.f32 f244, f218, 0f3EDE2602;
mul.f32 f245, f220, 0f3F48261C;
sub.f32 f246, f245, f244;
mul.f32 f247, f223, 0f3F7994E0;
sub.f32 f248, f246, f247;
sub.f32 f249, f243, f248;
add.f32 f250, f248, f243;
fma.rn.f32 f251, f207, 0f3F1F9D07, %63;
mul.f32 f252, f209, 0f3E63DC87;
sub.f32 f253, f251, f252;
mul.f32 f254, f211, 0f3F66A5E5;
sub.f32 f255, f253, f254;
sub.f32 f256, %72, %125;
mul.f32 f257, f256, 0f3F48261C;
sub.f32 f258, %82, %114;
mul.f32 f259, f258, 0fBF7994E0;
sub.f32 f260, f259, f257;
sub.f32 f261, %93, %104;
mul.f32 f262, f261, 0f3EDE2602;
sub.f32 f263, f260, f262;
add.f32 f264, f263, f255;
sub.f32 f265, f255, f263;
mul.f32 f266, f207, 0f3E63DC87;
sub.f32 f267, %63, f266;
mul.f32 f268, f209, 0f3F66A5E5;
sub.f32 f269, f267, f268;
fma.rn.f32 f270, f211, 0f3F1F9D07, f269;
mul.f32 f271, f256, 0f3F7994E0;
mul.f32 f272, f258, 0f3EDE2602;
sub.f32 f273, f272, f271;
fma.rn.f32 f274, f261, 0f3F48261C, f273;
add.f32 f275, f274, f270;
sub.f32 f276, f270, f274;
mul.f32 f277, f207, 0f3F66A5E5;
sub.f32 f278, %63, f277;
fma.rn.f32 f279, f209, 0f3F1F9D07, f278;
mul.f32 f280, f211, 0f3E63DC87;
sub.f32 f281, f279, f280;
mul.f32 f282, f256, 0f3EDE2602;
mul.f32 f283, f258, 0f3F48261C;
sub.f32 f284, f283, f282;
mul.f32 f285, f261, 0f3F7994E0;
sub.f32 f286, f284, f285;
add.f32 f287, f286, f281;
sub.f32 f288, f281, f286;
mul.f32 f289, f226, 0f3F66A5E5;
mul.f32 f290, f264, 0fBEDE2602;
sub.f32 f291, f289, f290;
mul.f32 f292, f264, 0f3F66A5E5;
fma.rn.f32 f293, f226, 0fBEDE2602, f292;
mul.f32 f294, f237, 0f3F1F9D07;
mul.f32 f295, f275, 0fBF48261C;
sub.f32 f296, f294, f295;
mul.f32 f297, f275, 0f3F1F9D07;
fma.rn.f32 f298, f237, 0fBF48261C, f297;
mul.f32 f299, f249, 0f3E63DC87;
mul.f32 f300, f287, 0fBF7994E0;
sub.f32 f301, f299, f300;
mul.f32 f302, f287, 0f3E63DC87;
fma.rn.f32 f303, f249, 0fBF7994E0, f302;
mul.f32 f304, f250, 0fBE63DC87;
mul.f32 f305, f288, 0fBF7994E0;
sub.f32 f306, f304, f305;
mul.f32 f307, f288, 0fBE63DC87;
fma.rn.f32 f308, f250, 0fBF7994E0, f307;
mul.f32 f309, f238, 0fBF1F9D07;
mul.f32 f310, f276, 0fBF48261C;
sub.f32 f311, f309, f310;
mul.f32 f312, f276, 0fBF1F9D07;
fma.rn.f32 f313, f238, 0fBF48261C, f312;
mul.f32 f314, f227, 0fBF66A5E5;
mul.f32 f315, f265, 0fBEDE2602;
sub.f32 f316, f314, f315;
mul.f32 f317, f265, 0fBF66A5E5;
fma.rn.f32 f318, f227, 0fBEDE2602, f317;
add.f32 f319, f118, f206;
add.f32 f320, f124, f212;
sub.f32 f321, f118, f206;
sub.f32 f322, f124, f212;
add.f32 f323, f138, f291;
add.f32 f324, f176, f293;
sub.f32 f325, f138, f291;
sub.f32 f326, f176, f293;
add.f32 f327, f149, f296;
add.f32 f328, f187, f298;
sub.f32 f329, f149, f296;
sub.f32 f330, f187, f298;
add.f32 f331, f161, f301;
add.f32 f332, f199, f303;
sub.f32 f333, f161, f301;
sub.f32 f334, f199, f303;
add.f32 f335, f162, f306;
add.f32 f336, f200, f308;
sub.f32 f337, f162, f306;
sub.f32 f338, f200, f308;
add.f32 f339, f150, f311;
add.f32 f340, f188, f313;
sub.f32 f341, f150, f311;
sub.f32 f342, f188, f313;
add.f32 f343, f139, f316;
add.f32 f344, f177, f318;
sub.f32 f345, f139, f316;
sub.f32 f346, f177, f318;
add.f32 f347, %69, %122;
add.f32 f348, %58, f347;
add.f32 f349, %80, %112;
add.f32 f350, f349, f348;
add.f32 f351, %90, %101;
add.f32 f352, f351, f350;
add.f32 f353, %71, %124;
add.f32 f354, %60, f353;
add.f32 f355, %81, %113;
add.f32 f356, f355, f354;
add.f32 f357, %92, %103;
add.f32 f358, f357, f356;
fma.rn.f32 f359, f347, 0f3F1F9D07, %58;
mul.f32 f360, f349, 0f3E63DC87;
sub.f32 f361, f359, f360;
mul.f32 f362, f351, 0f3F66A5E5;
sub.f32 f363, f361, f362;
sub.f32 f364, %71, %124;
mul.f32 f365, f364, 0f3F48261C;
sub.f32 f366, %81, %113;
mul.f32 f367, f366, 0fBF7994E0;
sub.f32 f368, f367, f365;
sub.f32 f369, %92, %103;
mul.f32 f370, f369, 0f3EDE2602;
sub.f32 f371, f368, f370;
sub.f32 f372, f363, f371;
add.f32 f373, f371, f363;
mul.f32 f374, f347, 0f3E63DC87;
sub.f32 f375, %58, f374;
mul.f32 f376, f349, 0f3F66A5E5;
sub.f32 f377, f375, f376;
fma.rn.f32 f378, f351, 0f3F1F9D07, f377;
mul.f32 f379, f364, 0f3F7994E0;
mul.f32 f380, f366, 0f3EDE2602;
sub.f32 f381, f380, f379;
fma.rn.f32 f382, f369, 0f3F48261C, f381;
sub.f32 f383, f378, f382;
add.f32 f384, f382, f378;
mul.f32 f385, f347, 0f3F66A5E5;
sub.f32 f386, %58, f385;
fma.rn.f32 f387, f349, 0f3F1F9D07, f386;
mul.f32 f388, f351, 0f3E63DC87;
sub.f32 f389, f387, f388;
mul.f32 f390, f364, 0f3EDE2602;
mul.f32 f391, f366, 0f3F48261C;
sub.f32 f392, f391, f390;
mul.f32 f393, f369, 0f3F7994E0;
sub.f32 f394, f392, f393;
sub.f32 f395, f389, f394;
add.f32 f396, f394, f389;
fma.rn.f32 f397, f353, 0f3F1F9D07, %60;
mul.f32 f398, f355, 0f3E63DC87;
sub.f32 f399, f397, f398;
mul.f32 f400, f357, 0f3F66A5E5;
sub.f32 f401, f399, f400;
sub.f32 f402, %69, %122;
mul.f32 f403, f402, 0f3F48261C;
sub.f32 f404, %80, %112;
mul.f32 f405, f404, 0fBF7994E0;
sub.f32 f406, f405, f403;
sub.f32 f407, %90, %101;
mul.f32 f408, f407, 0f3EDE2602;
sub.f32 f409, f406, f408;
add.f32 f410, f409, f401;
sub.f32 f411, f401, f409;
mul.f32 f412, f353, 0f3E63DC87;
sub.f32 f413, %60, f412;
mul.f32 f414, f355, 0f3F66A5E5;
sub.f32 f415, f413, f414;
fma.rn.f32 f416, f357, 0f3F1F9D07, f415;
mul.f32 f417, f402, 0f3F7994E0;
mul.f32 f418, f404, 0f3EDE2602;
sub.f32 f419, f418, f417;
fma.rn.f32 f420, f407, 0f3F48261C, f419;
add.f32 f421, f420, f416;
sub.f32 f422, f416, f420;
mul.f32 f423, f353, 0f3F66A5E5;
sub.f32 f424, %60, f423;
fma.rn.f32 f425, f355, 0f3F1F9D07, f424;
mul.f32 f426, f357, 0f3E63DC87;
sub.f32 f427, f425, f426;
mul.f32 f428, f402, 0f3EDE2602;
mul.f32 f429, f404, 0f3F48261C;
sub.f32 f430, f429, f428;
mul.f32 f431, f407, 0f3F7994E0;
sub.f32 f432, f430, f431;
add.f32 f433, f432, f427;
sub.f32 f434, f427, f432;
add.f32 f435, %74, %128;
add.f32 f436, %64, f435;
add.f32 f437, %85, %117;
add.f32 f438, f437, f436;
add.f32 f439, %96, %106;
add.f32 f440, f439, f438;
add.f32 f441, %76, %129;
add.f32 f442, %65, f441;
add.f32 f443, %87, %119;
add.f32 f444, f443, f442;
add.f32 f445, %97, %108;
add.f32 f446, f445, f444;
fma.rn.f32 f447, f435, 0f3F1F9D07, %64;
mul.f32 f448, f437, 0f3E63DC87;
sub.f32 f449, f447, f448;
mul.f32 f450, f439, 0f3F66A5E5;
sub.f32 f451, f449, f450;
sub.f32 f452, %76, %129;
mul.f32 f453, f452, 0f3F48261C;
sub.f32 f454, %87, %119;
mul.f32 f455, f454, 0fBF7994E0;
sub.f32 f456, f455, f453;
sub.f32 f457, %97, %108;
mul.f32 f458, f457, 0f3EDE2602;
sub.f32 f459, f456, f458;
sub.f32 f460, f451, f459;
add.f32 f461, f459, f451;
mul.f32 f462, f435, 0f3E63DC87;
sub.f32 f463, %64, f462;
mul.f32 f464, f437, 0f3F66A5E5;
sub.f32 f465, f463, f464;
fma.rn.f32 f466, f439, 0f3F1F9D07, f465;
mul.f32 f467, f452, 0f3F7994E0;
mul.f32 f468, f454, 0f3EDE2602;
sub.f32 f469, f468, f467;
fma.rn.f32 f470, f457, 0f3F48261C, f469;
sub.f32 f471, f466, f470;
add.f32 f472, f470, f466;
mul.f32 f473, f435, 0f3F66A5E5;
sub.f32 f474, %64, f473;
fma.rn.f32 f475, f437, 0f3F1F9D07, f474;
mul.f32 f476, f439, 0f3E63DC87;
sub.f32 f477, f475, f476;
mul.f32 f478, f452, 0f3EDE2602;
mul.f32 f479, f454, 0f3F48261C;
sub.f32 f480, f479, f478;
mul.f32 f481, f457, 0f3F7994E0;
sub.f32 f482, f480, f481;
sub.f32 f483, f477, f482;
add.f32 f484, f482, f477;
fma.rn.f32 f485, f441, 0f3F1F9D07, %65;
mul.f32 f486, f443, 0f3E63DC87;
sub.f32 f487, f485, f486;
mul.f32 f488, f445, 0f3F66A5E5;
sub.f32 f489, f487, f488;
sub.f32 f490, %74, %128;
mul.f32 f491, f490, 0f3F48261C;
sub.f32 f492, %85, %117;
mul.f32 f493, f492, 0fBF7994E0;
sub.f32 f494, f493, f491;
sub.f32 f495, %96, %106;
mul.f32 f496, f495, 0f3EDE2602;
sub.f32 f497, f494, f496;
add.f32 f498, f497, f489;
sub.f32 f499, f489, f497;
mul.f32 f500, f441, 0f3E63DC87;
sub.f32 f501, %65, f500;
mul.f32 f502, f443, 0f3F66A5E5;
sub.f32 f503, f501, f502;
fma.rn.f32 f504, f445, 0f3F1F9D07, f503;
mul.f32 f505, f490, 0f3F7994E0;
mul.f32 f506, f492, 0f3EDE2602;
sub.f32 f507, f506, f505;
fma.rn.f32 f508, f495, 0f3F48261C, f507;
add.f32 f509, f508, f504;
sub.f32 f510, f504, f508;
mul.f32 f511, f441, 0f3F66A5E5;
sub.f32 f512, %65, f511;
fma.rn.f32 f513, f443, 0f3F1F9D07, f512;
mul.f32 f514, f445, 0f3E63DC87;
sub.f32 f515, f513, f514;
mul.f32 f516, f490, 0f3EDE2602;
mul.f32 f517, f492, 0f3F48261C;
sub.f32 f518, f517, f516;
mul.f32 f519, f495, 0f3F7994E0;
sub.f32 f520, f518, f519;
add.f32 f521, f520, f515;
sub.f32 f522, f515, f520;
mul.f32 f523, f460, 0f3F66A5E5;
mul.f32 f524, f498, 0fBEDE2602;
sub.f32 f525, f523, f524;
mul.f32 f526, f498, 0f3F66A5E5;
fma.rn.f32 f527, f460, 0fBEDE2602, f526;
mul.f32 f528, f471, 0f3F1F9D07;
mul.f32 f529, f509, 0fBF48261C;
sub.f32 f530, f528, f529;
mul.f32 f531, f509, 0f3F1F9D07;
fma.rn.f32 f532, f471, 0fBF48261C, f531;
mul.f32 f533, f483, 0f3E63DC87;
mul.f32 f534, f521, 0fBF7994E0;
sub.f32 f535, f533, f534;
mul.f32 f536, f521, 0f3E63DC87;
fma.rn.f32 f537, f483, 0fBF7994E0, f536;
mul.f32 f538, f484, 0fBE63DC87;
mul.f32 f539, f522, 0fBF7994E0;
sub.f32 f540, f538, f539;
mul.f32 f541, f522, 0fBE63DC87;
fma.rn.f32 f542, f484, 0fBF7994E0, f541;
mul.f32 f543, f472, 0fBF1F9D07;
mul.f32 f544, f510, 0fBF48261C;
sub.f32 f545, f543, f544;
mul.f32 f546, f510, 0fBF1F9D07;
fma.rn.f32 f547, f472, 0fBF48261C, f546;
mul.f32 f548, f461, 0fBF66A5E5;
mul.f32 f549, f499, 0fBEDE2602;
sub.f32 f550, f548, f549;
mul.f32 f551, f499, 0fBF66A5E5;
fma.rn.f32 f552, f461, 0fBEDE2602, f551;
add.f32 f553, f352, f440;
add.f32 f554, f358, f446;
sub.f32 f555, f352, f440;
sub.f32 f556, f358, f446;
add.f32 f557, f372, f525;
add.f32 f558, f410, f527;
sub.f32 f559, f372, f525;
sub.f32 f560, f410, f527;
add.f32 f561, f383, f530;
add.f32 f562, f421, f532;
sub.f32 f563, f383, f530;
sub.f32 f564, f421, f532;
add.f32 f565, f395, f535;
add.f32 f566, f433, f537;
sub.f32 f567, f395, f535;
sub.f32 f568, f433, f537;
add.f32 f569, f396, f540;
add.f32 f570, f434, f542;
sub.f32 f571, f396, f540;
sub.f32 f572, f434, f542;
add.f32 f573, f384, f545;
add.f32 f574, f422, f547;
sub.f32 f575, f384, f545;
sub.f32 f576, f422, f547;
add.f32 f577, f373, f550;
add.f32 f578, f411, f552;
sub.f32 f579, f373, f550;
sub.f32 f580, f411, f552;
mul.f32 f581, f557, 0f3F7994E0;
mul.f32 f582, f558, 0fBE63DC87;
sub.f32 f583, f581, f582;
mul.f32 f584, f558, 0f3F7994E0;
fma.rn.f32 f585, f557, 0fBE63DC87, f584;
mul.f32 f586, f561, 0f3F66A5E5;
mul.f32 f587, f562, 0fBEDE2602;
sub.f32 f588, f586, f587;
mul.f32 f589, f562, 0f3F66A5E5;
fma.rn.f32 f590, f561, 0fBEDE2602, f589;
mul.f32 f591, f565, 0f3F48261C;
mul.f32 f592, f566, 0fBF1F9D07;
sub.f32 f593, f591, f592;
mul.f32 f594, f566, 0f3F48261C;
fma.rn.f32 f595, f565, 0fBF1F9D07, f594;
mul.f32 f596, f569, 0f3F1F9D07;
mul.f32 f597, f570, 0fBF48261C;
sub.f32 f598, f596, f597;
mul.f32 f599, f570, 0f3F1F9D07;
fma.rn.f32 f600, f569, 0fBF48261C, f599;
mul.f32 f601, f573, 0f3EDE2602;
mul.f32 f602, f574, 0fBF66A5E5;
sub.f32 f603, f601, f602;
mul.f32 f604, f574, 0f3EDE2602;
fma.rn.f32 f605, f573, 0fBF66A5E5, f604;
mul.f32 f606, f577, 0f3E63DC87;
mul.f32 f607, f578, 0fBF7994E0;
sub.f32 f608, f606, f607;
mul.f32 f609, f578, 0f3E63DC87;
fma.rn.f32 f610, f577, 0fBF7994E0, f609;
mul.f32 f611, f559, 0fBE63DC87;
mul.f32 f612, f560, 0fBF7994E0;
sub.f32 f613, f611, f612;
mul.f32 f614, f560, 0fBE63DC87;
fma.rn.f32 f615, f559, 0fBF7994E0, f614;
mul.f32 f616, f563, 0fBEDE2602;
mul.f32 f617, f564, 0fBF66A5E5;
sub.f32 f618, f616, f617;
mul.f32 f619, f564, 0fBEDE2602;
fma.rn.f32 f620, f563, 0fBF66A5E5, f619;
mul.f32 f621, f567, 0fBF1F9D07;
mul.f32 f622, f568, 0fBF48261C;
sub.f32 f623, f621, f622;
mul.f32 f624, f568, 0fBF1F9D07;
fma.rn.f32 f625, f567, 0fBF48261C, f624;
mul.f32 f626, f571, 0fBF48261C;
mul.f32 f627, f572, 0fBF1F9D07;
sub.f32 f628, f626, f627;
mul.f32 f629, f572, 0fBF48261C;
fma.rn.f32 f630, f571, 0fBF1F9D07, f629;
mul.f32 f631, f575, 0fBF66A5E5;
mul.f32 f632, f576, 0fBEDE2602;
sub.f32 f633, f631, f632;
mul.f32 f634, f576, 0fBF66A5E5;
fma.rn.f32 f635, f575, 0fBEDE2602, f634;
mul.f32 f636, f579, 0fBF7994E0;
mul.f32 f637, f580, 0fBE63DC87;
sub.f32 f638, f636, f637;
mul.f32 f639, f580, 0fBF7994E0;
fma.rn.f32 f640, f579, 0fBE63DC87, f639;
add.f32 %1, f320, f554;
add.f32 %0, f319, f553;
add.f32 %3, f324, f585;
add.f32 %2, f323, f583;
add.f32 %5, f328, f590;
add.f32 %4, f327, f588;
add.f32 %7, f332, f595;
add.f32 %6, f331, f593;
add.f32 %9, f336, f600;
add.f32 %8, f335, f598;
add.f32 %11, f340, f605;
add.f32 %10, f339, f603;
add.f32 %13, f344, f610;
add.f32 %12, f343, f608;
sub.f32 %15, f322, f555;
add.f32 %14, f321, f556;
add.f32 %17, f326, f615;
add.f32 %16, f325, f613;
add.f32 %19, f330, f620;
add.f32 %18, f329, f618;
add.f32 %21, f334, f625;
add.f32 %20, f333, f623;
add.f32 %23, f338, f630;
add.f32 %22, f337, f628;
add.f32 %25, f342, f635;
add.f32 %24, f341, f633;
add.f32 %27, f346, f640;
add.f32 %26, f345, f638;
sub.f32 %29, f320, f554;
sub.f32 %28, f319, f553;
sub.f32 %31, f324, f585;
sub.f32 %30, f323, f583;
sub.f32 %33, f328, f590;
sub.f32 %32, f327, f588;
sub.f32 %35, f332, f595;
sub.f32 %34, f331, f593;
sub.f32 %37, f336, f600;
sub.f32 %36, f335, f598;
sub.f32 %39, f340, f605;
sub.f32 %38, f339, f603;
sub.f32 %41, f344, f610;
sub.f32 %40, f343, f608;
add.f32 %43, f322, f555;
sub.f32 %42, f321, f556;
sub.f32 %45, f326, f615;
sub.f32 %44, f325, f613;
sub.f32 %47, f330, f620;
sub.f32 %46, f329, f618;
sub.f32 %49, f334, f625;
sub.f32 %48, f333, f623;
sub.f32 %51, f338, f630;
sub.f32 %50, f337, f628;
sub.f32 %53, f342, f635;
sub.f32 %52, f341, f633;
sub.f32 %55, f346, f640;
sub.f32 %54, f345, f638;
})"
     // Operand binding (positional; the PTX above refers to these by index):
     //   %0..%55   outputs: rmem[k].x is %(2k) and rmem[k].y is %(2k+1), k = 0..27.
     //   %56..%129 inputs taken from the same rmem elements. Many .y values are
     //             listed twice in a row; the first slot of each such pair
     //             (%59, %62, %67, ...) is never referenced by the PTX.
     // Every input operand is read before the first output operand is written,
     // so updating rmem in place does not overwrite a value that is still needed.
     // Do not reorder or remove operands: every %N index in the PTX depends on it.
     : "=f"(rmem[0].x), "=f"(rmem[0].y), "=f"(rmem[1].x), "=f"(rmem[1].y), "=f"(rmem[2].x), "=f"(rmem[2].y), "=f"(rmem[3].x), "=f"(rmem[3].y), "=f"(rmem[4].x), "=f"(rmem[4].y), "=f"(rmem[5].x), "=f"(rmem[5].y), "=f"(rmem[6].x), "=f"(rmem[6].y), "=f"(rmem[7].x), "=f"(rmem[7].y), "=f"(rmem[8].x), "=f"(rmem[8].y), "=f"(rmem[9].x), "=f"(rmem[9].y), "=f"(rmem[10].x), "=f"(rmem[10].y), "=f"(rmem[11].x), "=f"(rmem[11].y), "=f"(rmem[12].x), "=f"(rmem[12].y), "=f"(rmem[13].x), "=f"(rmem[13].y), "=f"(rmem[14].x), "=f"(rmem[14].y), "=f"(rmem[15].x), "=f"(rmem[15].y), "=f"(rmem[16].x), "=f"(rmem[16].y), "=f"(rmem[17].x), "=f"(rmem[17].y), "=f"(rmem[18].x), "=f"(rmem[18].y), "=f"(rmem[19].x), "=f"(rmem[19].y), "=f"(rmem[20].x), "=f"(rmem[20].y), "=f"(rmem[21].x), "=f"(rmem[21].y), "=f"(rmem[22].x), "=f"(rmem[22].y), "=f"(rmem[23].x), "=f"(rmem[23].y), "=f"(rmem[24].x), "=f"(rmem[24].y), "=f"(rmem[25].x), "=f"(rmem[25].y), "=f"(rmem[26].x), "=f"(rmem[26].y), "=f"(rmem[27].x), "=f"(rmem[27].y): "f"(rmem[0].x), "f"(rmem[0].y), "f"(rmem[1].x), "f"(rmem[1].y), "f"(rmem[1].y), "f"(rmem[2].x), "f"(rmem[2].y), "f"(rmem[2].y), "f"(rmem[3].x), "f"(rmem[3].y), "f"(rmem[4].x), "f"(rmem[4].y), "f"(rmem[4].y), "f"(rmem[5].x), "f"(rmem[5].y), "f"(rmem[5].y), "f"(rmem[6].x), "f"(rmem[6].y), "f"(rmem[7].x), "f"(rmem[7].y), "f"(rmem[7].y), "f"(rmem[8].x), "f"(rmem[8].y), "f"(rmem[8].y), "f"(rmem[9].x), "f"(rmem[9].y), "f"(rmem[10].x), "f"(rmem[10].y), "f"(rmem[10].y), "f"(rmem[11].x), "f"(rmem[11].y), "f"(rmem[11].y), "f"(rmem[12].x), "f"(rmem[12].y), "f"(rmem[13].x), "f"(rmem[13].y), "f"(rmem[13].y), "f"(rmem[14].x), "f"(rmem[14].y), "f"(rmem[14].y), "f"(rmem[15].x), "f"(rmem[15].y), "f"(rmem[16].x), "f"(rmem[16].y), "f"(rmem[16].y), "f"(rmem[17].x), "f"(rmem[17].y), "f"(rmem[17].y), "f"(rmem[18].x), "f"(rmem[18].y), "f"(rmem[19].x), "f"(rmem[19].y), "f"(rmem[19].y), "f"(rmem[20].x), "f"(rmem[20].y), "f"(rmem[20].y), "f"(rmem[21].x), "f"(rmem[21].y), "f"(rmem[22].x), "f"(rmem[22].y), 
"f"(rmem[22].y), "f"(rmem[23].x), "f"(rmem[23].y), "f"(rmem[23].y), "f"(rmem[24].x), "f"(rmem[24].y), "f"(rmem[25].x), "f"(rmem[25].y), "f"(rmem[25].y), "f"(rmem[26].x), "f"(rmem[26].y), "f"(rmem[26].y), "f"(rmem[27].x), "f"(rmem[27].y));
};


#endif
